# Read the ../ad_data file and generate the 1w_tokenized_unitid file; each key is an ad_id and each value is that ad's embedding.
import os
from tqdm import tqdm
import json
import numpy as np

def load_ad_embedding(path: str) -> dict:
    """Load ad embeddings from a JSON-lines file.

    Every non-blank line of the file is parsed as a JSON object and must
    provide the fields ``ad_id`` and ``ad_embedding``.

    Args:
        path: Location of the JSON-lines file to read.

    Returns:
        A dict mapping ``str(ad_id)`` to ``np.array(ad_embedding)``. If an
        ``ad_id`` occurs more than once, the last occurrence wins.

    Raises:
        OSError: If the file cannot be opened.
        json.JSONDecodeError: If a non-blank line is not valid JSON.
        KeyError: If a record lacks ``ad_id`` or ``ad_embedding``.
    """
    embeddings = {}
    # Decode explicitly as UTF-8 so the result does not depend on the
    # platform's default locale encoding.
    with open(path, 'r', encoding='utf-8') as f:
        for line in f:
            # Blank / whitespace-only lines carry no record; handing them to
            # json.loads would abort the whole load with a JSONDecodeError.
            if not line.strip():
                continue
            data = json.loads(line)
            embeddings[str(data['ad_id'])] = np.array(data['ad_embedding'])
    return embeddings


if __name__ == '__main__':
    # Maps str(ad_id) -> numpy array holding that ad's embedding.
    ad_embedding = load_ad_embedding('../ad_data')
